dev_InvertedDoublePendulum-v1


#ResultTotal_EpEntropyGae_LamTraining_TimingTest_N_IterTotal_StepsTest_RewardEnvKl_DivMomentumTotal_TimeCg_DampingTimesteps_Per_BatchTest_TimingDeltaGaeN_IterFilterSolvedExpAvg_RewardMax_Path_LengthGammaSurr_Loss
1488.985486638[2548, 4715, 6558, 8284, 10174, 12065, 13718, 1...[1.3461916447, 1.2696986198, 1.1220554113, 0.91...0.973380.78307509100[15000, 30000, 45000, 60000, 75000, 90000, 1050...48898.5486638InvertedDoublePendulum-v1...[0.0442264564, 0.1474678367, 0.1986001283, 0.12...0.9052906515[14.005687952, 26.4445948601, 38.3016319275, 49...0.1150003.347096920.01True300True950.0dev[53.3233776124, 62.9650133305, 74.3754830892, 7...50000.99[-0.0656886995, -0.1375486553, -0.0815420747, -...Download
2578.061345657[2548, 4715, 6541, 8419, 10474, 12500, 14406, 1...[1.3461916447, 1.2729489803, 1.0493670702, 0.84...0.973408.16854596100[15000, 30000, 45000, 60000, 75000, 90000, 1050...57806.1345657InvertedDoublePendulum-v1...[0.0442264564, 0.1408879161, 0.2408334017, 0.12...0.8679054258[14.9499878883, 27.6219718456, 39.4206898212, 5...0.1150004.15686392780.01True300True950.0dev[53.3233776124, 62.9650133305, 75.0642430707, 7...50000.99[-0.0656886995, -0.1352116764, -0.0646118969, -...Download
3746.40732187[2548, 4715, 6613, 8478, 10240, 11874, 13344, 1...[1.3461916447, 1.3081080914, 1.3647431135, 1.39...0.973268.82720089100[15000, 30000, 45000, 60000, 75000, 90000, 1050...74640.732187InvertedDoublePendulum-v1...[0.0442264564, 0.0818773732, 0.0641594753, 0.05...0.4638048044[14.9572029114, 27.8737409115, 40.0754570961, 5...0.1150005.21989989280.01True300True950.0dev[53.3233776124, 62.9650133305, 72.1362728888, 7...50000.99[-0.0656886995, -0.1076418459, -0.0480623171, -...Download
4847.349728908[2548, 4715, 6631, 8423, 10121, 11796, 13320, 1...[1.3461916447, 1.3076579571, 1.3938522339, 1.49...0.973193.05432796100[15000, 30000, 45000, 60000, 75000, 90000, 1050...84734.9728908InvertedDoublePendulum-v1...[0.0442264564, 0.0824700221, 0.0518238619, 0.06...0.468732842[14.7649440765, 27.1752290726, 39.0949010849, 5...0.1150006.16070508960.01True300True950.0dev[53.3233776124, 62.9650133305, 71.4546177176, 7...50000.99[-0.0656886995, -0.1080022529, -0.0430226661, -...Download
5980.869885577[2548, 4715, 6605, 8322, 10051, 11807, 13400, 1...[1.3461916447, 1.3007307053, 1.1112821102, 1.01...0.973239.14985394100[15000, 30000, 45000, 60000, 75000, 90000, 1050...98086.9885577InvertedDoublePendulum-v1...[0.0442264564, 0.0926024839, 0.0703018233, 0.08...0.549406131[14.3370330334, 26.2276480198, 38.1985800266, 5...0.1150006.2667698860.01True300True950.0dev[53.3233776124, 62.9650133305, 72.467059581, 80...50000.99[-0.0656886995, -0.1138220653, -0.0761752278, -...Download
61275.28249928[2548, 4715, 6647, 8407, 10071, 11842, 13481, 1...[1.3461916447, 1.3223040104, 1.1328006983, 0.96...0.973299.27640581100[15000, 30000, 45000, 60000, 75000, 90000, 1050...127528.249928InvertedDoublePendulum-v1...[0.0442264564, 0.0639006197, 0.0555282645, 0.08...0.3006138187[14.8109779358, 27.5584180355, 40.1458580494, 5...0.1150009.05705404280.01True300True950.0dev[53.3233776124, 62.9650133305, 70.8523806575, 7...50000.99[-0.0656886995, -0.0953896195, -0.0701108724, -...Download
71397.38377768[2548, 4715, 6653, 8524, 10504, 12378, 14031, 1...[1.3461916447, 1.3287755251, 1.2375167608, 1.09...0.973303.41119003100[15000, 30000, 45000, 60000, 75000, 90000, 1050...139738.377768InvertedDoublePendulum-v1...[0.0442264564, 0.0567731485, 0.0694540367, 0.04...0.2265854833[14.649974823, 26.7792508602, 38.8349628448, 50...0.1150009.31136417390.01True300True950.0dev[53.3233776124, 62.9650133305, 70.614021377, 73...50000.99[-0.0656886995, -0.0896390527, -0.0674440414, -...Download
81494.60862232[2548, 4715, 6779, 8604, 10489, 12113, 13580, 1...[1.3461916447, 1.3747055531, 1.2034468651, 1.24...0.973253.511127100[15000, 30000, 45000, 60000, 75000, 90000, 1050...149460.862232InvertedDoublePendulum-v1...[0.0442264564, 0.0228590034, 0.0443908647, 0.03...-0.3014089875[14.4210429192, 27.3446588516, 39.4706568718, 5...0.11500010.78666591640.01True300True950.0dev[53.3233776124, 62.9650133305, 66.1986887662, 7...50000.99[-0.0656886995, -0.0456668995, -0.0742566735, 0...Download
91691.07529888[2548, 4715, 6608, 8415, 10257, 11971, 13449, 1...[1.3461916447, 1.3108348846, 1.1118278503, 0.89...0.973280.9995141100[15000, 30000, 45000, 60000, 75000, 90000, 1050...169107.529888InvertedDoublePendulum-v1...[0.0442264564, 0.0782235935, 0.0760113597, 0.09...0.4328650041[15.020004034, 27.6153738499, 40.1609508991, 52...0.11500011.52089405060.01True300True950.0dev[53.3233776124, 62.9650133305, 72.3433370478, 7...50000.99[-0.0656886995, -0.1053652912, -0.0682567731, -...Download
101803.02235177[2548, 4715, 6674, 8451, 10060, 11564, 12906, 1...[1.3461916447, 1.336463809, 1.1657418013, 1.021...0.973269.21360302100[15000, 30000, 45000, 60000, 75000, 90000, 1050...180302.235177InvertedDoublePendulum-v1...[0.0442264564, 0.0490537584, 0.0521676987, 0.05...0.1380018843[14.0766911507, 27.8995251656, 40.4443380833, 5...0.11500012.8073799610.01True300True950.0dev[53.3233776124, 62.9650133305, 69.8451393834, 7...50000.99[-0.0656886995, -0.0826095194, -0.0712597817, -...Download
112019.35492989[2548, 4715, 6631, 8339, 10028, 11848, 13696, 1...[1.3461916447, 1.3155937195, 1.2314862013, 1.10...0.974085.51687098100[15000, 30000, 45000, 60000, 75000, 90000, 1050...201935.492989InvertedDoublePendulum-v1...[0.0442264564, 0.0720223635, 0.0696854964, 0.10...0.3779335026[18.0965819359, 33.6612989902, 48.8399708271, 6...0.11500017.24236512180.01True300True950.0dev[53.3233776124, 62.9650133305, 71.4536947795, 8...50000.99[-0.0656886995, -0.1012694314, -0.0803958476, -...Download
122293.77272859[2548, 4715, 6657, 8386, 9982, 11400, 12721, 14...[1.3461916447, 1.3261333704, 1.1990517378, 1.05...0.973222.54625106100[15000, 30000, 45000, 60000, 75000, 90000, 1050...229377.272859InvertedDoublePendulum-v1...[0.0442264564, 0.059665639, 0.0667033643, 0.077...0.2574165326[14.5856609344, 26.5904729366, 38.5611259937, 5...0.11500015.66797685620.01True300True950.0dev[53.3233776124, 62.9650133305, 70.4674589142, 7...50000.99[-0.0656886995, -0.0920481086, -0.0868960917, -...Download
133574.82356359[2548, 4715, 6634, 8424, 10190, 11854, 13352, 1...[1.3461916447, 1.3168848753, 1.1706707478, 1.03...0.973272.16654491100[15000, 30000, 45000, 60000, 75000, 90000, 1050...357482.356359InvertedDoublePendulum-v1...[0.0442264564, 0.0704509914, 0.0778285861, 0.08...0.3634831978[11.9859418869, 24.1982939243, 36.38438797, 48....0.11500024.12776994710.01True300True950.0dev[53.3233776124, 62.9650133305, 71.3400796536, 7...50000.99[-0.0656886995, -0.1001806259, -0.0691949055, -...Download
144117.54954188[2548, 4715, 6657, 8508, 10531, 12592, 14401, 1...[1.3461916447, 1.3276264668, 1.147158742, 1.117...0.973276.41035819100[15000, 30000, 45000, 60000, 75000, 90000, 1050...411754.954188InvertedDoublePendulum-v1...[0.0442264564, 0.0580414347, 0.0590459481, 0.04...0.2402458126[15.2485780716, 27.8988001347, 41.0152981281, 5...0.11500028.32573413850.01True300True950.0dev[53.3233776124, 62.9650133305, 70.4610273848, 7...50000.99[-0.0656886995, -0.0907088816, -0.0579038486, -...Download
155188.47084125[2548, 4715, 6647, 8407, 10089, 11831, 13505, 1...[1.3461916447, 1.3223041296, 1.1328011751, 0.96...0.973230.12983799100[15000, 30000, 45000, 60000, 75000, 90000, 1050...518847.084125InvertedDoublePendulum-v1...[0.0442264564, 0.0638979971, 0.0555260293, 0.08...0.3005876229[13.7551670074, 26.0661308765, 37.6126208305, 4...0.11500035.89605998990.01True300True950.0dev[53.3233776124, 62.9650133305, 70.8523669984, 7...50000.99[-0.0656886995, -0.0953876823, -0.0701118782, -...Download
166145.07414374[2548, 4715, 6631, 8470, 10243, 12165, 14080, 1...[1.3461916447, 1.3247044086, 1.2450668812, 1.23...0.973262.79607511100[15000, 30000, 45000, 60000, 75000, 90000, 1050...614507.414374InvertedDoublePendulum-v1...[0.0442264564, 0.0612287745, 0.0737323239, 0.04...0.2736163946[14.4505040646, 26.9183309078, 38.6909408569, 5...0.11500040.48134684560.01True300True950.0dev[53.3233776124, 62.9650133305, 71.4358105203, 7...50000.99[-0.0656886995, -0.0933059081, -0.0690840632, -...Download
1710153.286208[2548, 4715, 6592, 8388, 10036, 11520, 12854, 1...[1.3461916447, 1.3044950962, 1.3416006565, 1.38...0.973256.62781215100[15000, 30000, 45000, 60000, 75000, 90000, 1050...1015328.6208InvertedDoublePendulum-v1...[0.0442264564, 0.0869955793, 0.0663658455, 0.07...0.5055667331[14.8153440952, 27.1714110374, 39.2677080631, 5...0.11500069.83876013760.01True300True950.0dev[53.3233776124, 62.9650133305, 72.9687076078, 7...50000.99[-0.0656886995, -0.1106788069, -0.0579471104, -...Download
1811075.1788445[2548, 4715, 6661, 8436, 10048, 11565, 12985, 1...[1.3461916447, 1.3349226713, 1.1650505066, 1.01...0.973304.23068595100[15000, 30000, 45000, 60000, 75000, 90000, 1050...1107517.88445InvertedDoublePendulum-v1...[0.0442264564, 0.0505920127, 0.0539808497, 0.05...0.1564748936[14.6978840828, 26.827559948, 38.9791250229, 51...0.11500076.19383096690.01True300True950.0dev[53.3233776124, 62.9650133305, 70.3135195621, 7...50000.99[-0.0656886995, -0.0840882435, -0.0714026913, -...Download
1911377.0878989[2548, 4715, 6633, 8585, 10330, 12102, 14029, 1...[1.3461916447, 1.3251835108, 1.2898736, 1.13823...0.973221.61264491100[15000, 30000, 45000, 60000, 75000, 90000, 1050...1137708.78989InvertedDoublePendulum-v1...[0.0442264564, 0.0607159697, 0.0081370836, 0.04...0.2683365772[14.4271709919, 26.679571867, 39.2260408401, 51...0.11500077.09018301960.01True300True950.0dev[53.3233776124, 62.9650133305, 71.3702992108, 7...50000.99[-0.0656886995, -0.0928966403, -0.0019305112, -...Download
2016954.2710901[2548, 4715, 6629, 8399, 9972, 11342, 12579, 13...[1.3461916447, 1.3191810846, 1.3831442595, 1.38...0.973167.4648819100[15000, 30000, 45000, 60000, 75000, 90000, 1050...1695427.10901InvertedDoublePendulum-v1...[0.0442264564, 0.0676134899, 0.0489983633, 0.05...0.3367918896[14.0851018429, 25.996901989, 37.6242179871, 49...0.115000115.2643089290.01True300True950.0dev[53.3233776124, 62.9650133305, 71.5274144027, 7...50000.99[-0.0656886995, -0.0981572345, -0.0506201796, -...Download
2126035.163333[2548, 4715, 6619, 8468, 10272, 11997, 13532, 1...[1.3461916447, 1.3076170683, 1.2856413126, 1.16...0.973238.23955798100[15000, 30000, 45000, 60000, 75000, 90000, 1050...2603516.3333InvertedDoublePendulum-v1...[0.0442264564, 0.0825850591, 0.0926983878, 0.10...0.4696863511[15.1162269115, 27.9347290993, 40.1560509205, 5...0.115000182.3103270530.01True300True950.0dev[53.3233776124, 62.9650133305, 71.9171636393, 7...50000.99[-0.0656886995, -0.1080719754, -0.06717816, -0....Download
2229937.1355468[2548, 4715, 6665, 8413, 9974, 11547, 13266, 15...[1.3461916447, 1.3285729885, 1.1445786953, 0.98...0.973305.37432504100[15000, 30000, 45000, 60000, 75000, 90000, 1050...2993713.55468InvertedDoublePendulum-v1...[0.0442264564, 0.0570379272, 0.049672462, 0.071...0.2294561927[14.2600910664, 26.7870049477, 38.9587759972, 5...0.115000211.6494569780.01True300True950.0dev[53.3233776124, 62.9650133305, 70.1728537694, 7...50000.99[-0.0656886995, -0.0898642614, -0.0692968592, -...Download
2332489.6279617[2548, 4715, 6711, 8455, 10115, 11726, 13237, 1...[1.3461916447, 1.3442283869, 1.1662302017, 1.15...0.973182.61307907100[15000, 30000, 45000, 60000, 75000, 90000, 1050...3248962.79617InvertedDoublePendulum-v1...[0.0442264564, 0.0421958007, 0.0450628139, 0.03...0.0495107258[14.2916829586, 26.6044359207, 38.5087718964, 5...0.115000221.8798329830.01True300True950.0dev[53.3233776124, 62.9650133305, 68.5041488032, 7...50000.99[-0.0656886995, -0.0754342154, -0.0697478056, -...Download
2433061.2963041[2548, 4715, 6726, 8596, 10247, 11703, 13012, 1...[1.3461916447, 1.3586930037, 1.1764820814, 1.07...0.973280.9642272100[15000, 30000, 45000, 60000, 75000, 90000, 1050...3306129.63041InvertedDoublePendulum-v1...[0.0442264564, 0.0315284394, 0.0461694822, 0.04...-0.1166045987[14.6926660538, 26.712553978, 38.9976379871, 51...0.115000221.3575870990.01True300True950.0dev[53.3233776124, 62.9650133305, 67.985810177, 73...50000.99[-0.0656886995, -0.0615856498, -0.044256296, -0...Download
2539246.685287[2548, 4715, 6715, 8500, 10105, 11775, 13456, 1...[1.3461916447, 1.3455450535, 1.188911438, 1.035...0.973204.76505899100[15000, 30000, 45000, 60000, 75000, 90000, 1050...3924668.5287InvertedDoublePendulum-v1...[0.0442264564, 0.041083809, 0.047282923, 0.0495...0.0340604238[14.6687691212, 27.3366270065, 39.775370121, 51...0.115000267.5085690020.01True300True950.0dev[53.3233776124, 62.9650133305, 68.3718775457, 7...50000.99[-0.0656886995, -0.0741665214, -0.0807759091, -...Download
2643707.4894839[2548, 4715, 6584, 8562, 10785, 12991, 15090, 1...[1.3461916447, 1.2843459845, 1.1594517231, 1.04...0.974109.12449813100[15000, 30000, 45000, 60000, 75000, 90000, 1050...4370748.94839InvertedDoublePendulum-v1...[0.0442264564, 0.1193841994, 0.1914270669, 0.05...0.7369532015[18.3353068829, 34.4484078884, 49.5475358963, 6...0.115000294.7322120670.01True300True950.0dev[53.3233776124, 62.9650133305, 73.3125618552, 6...50000.99[-0.0656886995, -0.1267330945, -0.0479240678, 0...Download
2748958.2904915[2548, 4715, 6634, 8396, 10165, 11978, 13647, 1...[1.3461916447, 1.3180236816, 1.3136698008, 1.39...0.973295.89623284100[15000, 30000, 45000, 60000, 75000, 90000, 1050...4895829.04915InvertedDoublePendulum-v1...[0.0442264564, 0.069041796, 0.0671408772, 0.053...0.3503258371[11.8676390648, 23.6481890678, 36.0670769215, 4...0.115000328.400992870.01True300True950.0dev[53.3233776124, 62.9650133305, 71.3290904618, 7...50000.99[-0.0656886995, -0.0991852432, -0.0711893886, -...Download
2850641.6094401[2548, 4715, 6646, 8554, 10252, 11775, 13100, 1...[1.3461916447, 1.317535162, 1.2781245708, 1.118...0.973265.40937185100[15000, 30000, 45000, 60000, 75000, 90000, 1050...5064160.94401InvertedDoublePendulum-v1...[0.0442264564, 0.0696473122, 0.0085488642, 0.05...0.3560025861[14.8955140114, 27.6319329739, 40.1490468979, 5...0.115000334.8671519760.01True300True950.0dev[53.3233776124, 62.9650133305, 70.8919735125, 7...50000.99[-0.0656886995, -0.0996151567, -0.0096561564, -...Download
2951231.5590037[2548, 4715, 6634, 8336, 9843, 11170, 12375, 13...[1.3461916447, 1.3183997869, 1.2045927048, 1.14...0.973200.56785917100[15000, 30000, 45000, 60000, 75000, 90000, 1050...5123155.90037InvertedDoublePendulum-v1...[0.0442264564, 0.0685196742, 0.0759307221, 0.06...0.3454022726[14.2567801476, 27.0329611301, 39.2209050655, 5...0.115000348.6160571570.01True300True950.0dev[53.3233776124, 62.9650133305, 71.3298378597, 8...50000.99[-0.0656886995, -0.0988116264, -0.088922821, -0...Download
3059267.7847537[2548, 4715, 6647, 8422, 10024, 11465, 12730, 1...[1.3461916447, 1.3229058981, 1.1333042383, 0.96...0.973265.26265407100[15000, 30000, 45000, 60000, 75000, 90000, 1050...5926778.47537InvertedDoublePendulum-v1...[0.0442264564, 0.0632621199, 0.056045711, 0.077...0.2942390065[15.3080999851, 27.6051940918, 40.2138659954, 5...0.115000406.8137569430.01True300True950.0dev[53.3233776124, 62.9650133305, 70.8480774269, 7...50000.99[-0.0656886995, -0.0948989838, -0.0683862194, -...Download
3166557.3809147[2548, 4715, 6750, 8627, 10311, 12047, 13951, 1...[1.3461916447, 1.353066802, 1.1740900278, 1.034...0.973250.24443197100[15000, 30000, 45000, 60000, 75000, 90000, 1050...6655738.09147InvertedDoublePendulum-v1...[0.0442264564, 0.0352909788, 0.044818081, 0.042...-0.0528399458[13.8723299503, 25.5926399231, 36.9437060356, 4...0.115000446.3974969390.01True300True950.0dev[53.3233776124, 62.9650133305, 67.1708408188, 7...50000.99[-0.0656886995, -0.0669570863, -0.0480999835, -...Download
3273409.6809374[2548, 4715, 6629, 8506, 10362, 12386, 14600, 1...[1.3461916447, 1.3117240667, 1.328135252, 1.263...0.973295.81668997100[15000, 30000, 45000, 60000, 75000, 90000, 1050...7340968.09374InvertedDoublePendulum-v1...[0.0442264564, 0.0769954398, 0.005970038, 0.050...0.4222368304[14.6896369457, 27.525687933, 40.2733168602, 52...0.115000497.4569110870.01True300True950.0dev[53.3233776124, 62.9650133305, 71.531502896, 72...50000.99[-0.0656886995, -0.1045783237, -0.0159327146, -...Download
3376038.5110219[2548, 4715, 6739, 8637, 10329, 11838, 13190, 1...[1.3461916447, 1.3601952791, 1.17608881, 1.0612...0.973263.16739011100[15000, 30000, 45000, 60000, 75000, 90000, 1050...7603851.10219InvertedDoublePendulum-v1...[0.0442264564, 0.0305604525, 0.0454002805, 0.03...-0.13421736[14.2480502129, 26.5600471497, 39.2269990444, 5...0.115000528.237941980.01True300True950.0dev[53.3233776124, 62.9650133305, 67.5444286478, 7...50000.99[-0.0656886995, -0.0600903481, -0.0479769893, -...Download
3476187.9086533[2548, 4715, 6740, 8608, 10246, 11757, 13172, 1...[1.3461916447, 1.3620091677, 1.1782253981, 1.11...0.973225.26936102100[15000, 30000, 45000, 60000, 75000, 90000, 1050...7618790.86533InvertedDoublePendulum-v1...[0.0442264564, 0.0294408388, 0.0472331308, 0.04...-0.1553174179[14.6142070293, 26.6663150787, 38.6333830357, 5...0.115000526.1596848970.01True300True950.0dev[53.3233776124, 62.9650133305, 67.5024565195, 7...50000.99[-0.0656886995, -0.058292754, -0.0406474359, -0...Download
3582671.1649278[2548, 4715, 6619, 8647, 10973, 13414, 15734, 1...[1.3461916447, 1.3000000715, 1.3523418903, 1.33...0.973288.90657616100[15000, 30000, 45000, 60000, 75000, 90000, 1050...8267116.49278InvertedDoublePendulum-v1...[0.0442264564, 0.0935923755, 0.10140948, 0.0192...0.556955875[14.409072876, 25.9391000271, 37.774600029, 49....0.115000558.5510358810.01True300True950.0dev[53.3233776124, 62.9650133305, 71.9288365138, 6...50000.99[-0.0656886995, -0.1143587753, -0.0192949567, 0...Download
3683607.1830903[2548, 4715, 6609, 8567, 10778, 12945, 15213, 1...[1.3461916447, 1.2985354662, 1.1616353989, 1.04...0.973274.56354308100[15000, 30000, 45000, 60000, 75000, 90000, 1050...8360718.30903InvertedDoublePendulum-v1...[0.0442264564, 0.095828861, 0.1157105491, 0.079...0.5738103751[14.0255861282, 25.2666771412, 36.4669020176, 4...0.115000575.6435031890.01True300True950.0dev[53.3233776124, 62.9650133305, 72.3119321249, 6...50000.99[-0.0656886995, -0.1155517176, -0.0460243821, 0...Download
3787962.2391482[2548, 4715, 6788, 8705, 10456, 12107, 13600, 1...[1.3461916447, 1.3716187477, 1.1879911423, 1.13...0.973243.85556889100[15000, 30000, 45000, 60000, 75000, 90000, 1050...8796223.91482InvertedDoublePendulum-v1...[0.0442264564, 0.0242804792, 0.0469736233, 0.03...-0.2657422122[14.3869740963, 26.6804921627, 38.7675740719, 5...0.115000606.5989580150.01True300True950.0dev[53.3233776124, 62.9650133305, 65.9220079379, 7...50000.99[-0.0656886995, -0.0487769432, -0.0440099202, -...Download